/*
 * Per-row sparse dot product; each work-item handles at most one row.
 *
 * For the work-item whose global id in dimension 0 is r, with r < rows, this
 * sums values[k] * v[colIdx[k]] for every k in the half-open range
 * [rowPtr[r] - offSet, rowPtr[r + 1] - offSet) and stores the sum in answer[r].
 * Work-items with r >= rows write nothing.
 *
 * Parameters:
 *   values  - coefficients, indexed by k
 *   v       - vector, indexed by the column number read from colIdx[k]
 *   colIdx  - column number for each k
 *   rowPtr  - row boundaries; entries r and r + 1 are read for row r
 *   rows    - number of rows to process
 *   answer  - output, one element written per processed row
 *   offSet  - subtracted from both rowPtr entries before indexing
 *
 * NOTE(review): the name and access pattern suggest a CSR matrix-vector
 * product in which offSet rebases rowPtr onto the slice of values/colIdx
 * given to one of two devices -- confirm against the host code.
 */
__kernel
void csr_opencl_twodev(__global float *values, __global float *v, __global int *colIdx, __global int *rowPtr, const int rows, __global float *answer, const int offSet) {
	const int row = get_global_id(0);

	// Work-items past the last row have nothing to compute.
	if (row < rows) {
		// Bounds of this row's entries after applying offSet.
		const int first = rowPtr[row] - offSet;
		const int last = rowPtr[row + 1] - offSet;

		float sum = 0;
		int k = first;
		while (k < last) {
			sum += values[k] * v[colIdx[k]];
			k++;
		}

		answer[row] = sum;
	}
}